1 package org.apache.lucene.index;
2
3 /*
4 * Licensed to the Apache Software Foundation (ASF) under one or more
5 * contributor license agreements. See the NOTICE file distributed with
6 * this work for additional information regarding copyright ownership.
7 * The ASF licenses this file to You under the Apache License, Version 2.0
8 * (the "License"); you may not use this file except in compliance with
9 * the License. You may obtain a copy of the License at
10 *
11 * http://www.apache.org/licenses/LICENSE-2.0
12 *
13 * Unless required by applicable law or agreed to in writing, software
14 * distributed under the License is distributed on an "AS IS" BASIS,
15 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
16 * See the License for the specific language governing permissions and
17 * limitations under the License.
18 */
19
20 import org.apache.lucene.util.Version;
21
22 import java.io.IOException;
23 import java.util.ArrayList;
24 import java.util.List;
25 import java.util.Map;
26 import java.util.HashMap;
27
28 /** This {@link MergePolicy} is used for upgrading all existing segments of
29 * an index when calling {@link IndexWriter#forceMerge(int)}.
30 * All other methods delegate to the base {@code MergePolicy} given to the constructor.
31 * This allows for an as-cheap-as possible upgrade of an older index by only upgrading segments that
32 * are created by previous Lucene versions. forceMerge does no longer really merge;
33 * it is just used to "forceMerge" older segment versions away.
34 * <p>In general one would use {@link IndexUpgrader}, but for a fully customizeable upgrade,
35 * you can use this like any other {@code MergePolicy} and call {@link IndexWriter#forceMerge(int)}:
36 * <pre class="prettyprint lang-java">
37 * IndexWriterConfig iwc = new IndexWriterConfig(Version.LUCENE_XX, new KeywordAnalyzer());
38 * iwc.setMergePolicy(new UpgradeIndexMergePolicy(iwc.getMergePolicy()));
39 * IndexWriter w = new IndexWriter(dir, iwc);
40 * w.forceMerge(1);
41 * w.close();
42 * </pre>
43 * <p><b>Warning:</b> This merge policy may reorder documents if the index was partially
44 * upgraded before calling forceMerge (e.g., documents were added). If your application relies
45 * on "monotonicity" of doc IDs (which means that the order in which the documents
46 * were added to the index is preserved), do a forceMerge(1) instead. Please note, the
47 * delegate {@code MergePolicy} may also reorder documents.
48 * @lucene.experimental
49 * @see IndexUpgrader
50 */
51 public class UpgradeIndexMergePolicy extends MergePolicy {
52
53 /** Wrapped {@link MergePolicy}. */
54 protected final MergePolicy base;
55
56 /** Wrap the given {@link MergePolicy} and intercept forceMerge requests to
57 * only upgrade segments written with previous Lucene versions. */
58 public UpgradeIndexMergePolicy(MergePolicy base) {
59 this.base = base;
60 }
61
62 /** Returns if the given segment should be upgraded. The default implementation
63 * will return {@code !Version.LATEST.equals(si.getVersion())},
64 * so all segments created with a different version number than this Lucene version will
65 * get upgraded.
66 */
67 protected boolean shouldUpgradeSegment(SegmentCommitInfo si) {
68 return !Version.LATEST.equals(si.info.getVersion());
69 }
70
71 @Override
72 public MergeSpecification findMerges(MergeTrigger mergeTrigger, SegmentInfos segmentInfos, IndexWriter writer) throws IOException {
73 return base.findMerges(null, segmentInfos, writer);
74 }
75
76 @Override
77 public MergeSpecification findForcedMerges(SegmentInfos segmentInfos, int maxSegmentCount, Map<SegmentCommitInfo,Boolean> segmentsToMerge, IndexWriter writer) throws IOException {
78 // first find all old segments
79 final Map<SegmentCommitInfo,Boolean> oldSegments = new HashMap<>();
80 for (final SegmentCommitInfo si : segmentInfos) {
81 final Boolean v = segmentsToMerge.get(si);
82 if (v != null && shouldUpgradeSegment(si)) {
83 oldSegments.put(si, v);
84 }
85 }
86
87 if (verbose(writer)) {
88 message("findForcedMerges: segmentsToUpgrade=" + oldSegments, writer);
89 }
90
91 if (oldSegments.isEmpty())
92 return null;
93
94 MergeSpecification spec = base.findForcedMerges(segmentInfos, maxSegmentCount, oldSegments, writer);
95
96 if (spec != null) {
97 // remove all segments that are in merge specification from oldSegments,
98 // the resulting set contains all segments that are left over
99 // and will be merged to one additional segment:
100 for (final OneMerge om : spec.merges) {
101 oldSegments.keySet().removeAll(om.segments);
102 }
103 }
104
105 if (!oldSegments.isEmpty()) {
106 if (verbose(writer)) {
107 message("findForcedMerges: " + base.getClass().getSimpleName() +
108 " does not want to merge all old segments, merge remaining ones into new segment: " + oldSegments, writer);
109 }
110 final List<SegmentCommitInfo> newInfos = new ArrayList<>();
111 for (final SegmentCommitInfo si : segmentInfos) {
112 if (oldSegments.containsKey(si)) {
113 newInfos.add(si);
114 }
115 }
116 // add the final merge
117 if (spec == null) {
118 spec = new MergeSpecification();
119 }
120 spec.add(new OneMerge(newInfos));
121 }
122
123 return spec;
124 }
125
126 @Override
127 public MergeSpecification findForcedDeletesMerges(SegmentInfos segmentInfos, IndexWriter writer) throws IOException {
128 return base.findForcedDeletesMerges(segmentInfos, writer);
129 }
130
131 @Override
132 public boolean useCompoundFile(SegmentInfos segments, SegmentCommitInfo newSegment, IndexWriter writer) throws IOException {
133 return base.useCompoundFile(segments, newSegment, writer);
134 }
135
136 @Override
137 public String toString() {
138 return "[" + getClass().getSimpleName() + "->" + base + "]";
139 }
140
141 private boolean verbose(IndexWriter writer) {
142 return writer != null && writer.infoStream.isEnabled("UPGMP");
143 }
144
145 private void message(String message, IndexWriter writer) {
146 writer.infoStream.message("UPGMP", message);
147 }
148 }